#!/usr/bin/env bash
#
# Launch a vLLM server for the local QVQ-72B-Preview checkpoint, published
# under the model name "qvq72b" on 0.0.0.0:8000.
#
# Usage: bash <this-script>
set -euo pipefail

# Both timeouts are raised to the same wall-clock duration (10 hours); note
# the differing units per the vLLM environment-variable documentation:
#   VLLM_ENGINE_ITERATION_TIMEOUT_S is expressed in seconds,
#   VLLM_RPC_TIMEOUT is expressed in milliseconds.
export VLLM_ENGINE_ITERATION_TIMEOUT_S=36000
export VLLM_RPC_TIMEOUT=36000000

# Context window passed to --max-model-len: 8 * 1024 = 8192.
# POSIX $(( )) replaces the obsolete bash-only $[ ] arithmetic form.
readonly max_model_len=$((8 * 1024))

# -tp 8 is the short form of --tensor-parallel-size.
# NOTE(review): presumably this host exposes 8 accelerators -- confirm.
vllm serve "/home/corex/wj/QVQ-72B-Preview/" \
  --served-model-name "qvq72b" \
  -tp 8 \
  --max-model-len "${max_model_len}" \
  --disable-log-stats \
  --trust-remote-code \
  --host 0.0.0.0 \
  --port 8000
